% ------------------------------------------------------------------------
% SAMPLE BIBLIOGRAPHY FILE
% ------------------------------------------------------------------------

% Nadas (1983): conditional vs. unconditional maximum-likelihood training.
% The issue number lives in its own field; volume holds the bare volume only.
@article{Nadas1983,
  author  = {Nadas, A.},
  title   = {A decision theoretic formulation of a training problem in speech recognition and a comparison of training by unconditional versus conditional maximum likelihood},
  journal = {IEEE Transactions on Acoustics, Speech, and Signal Processing},
  volume  = {31},
  number  = {4},
  pages   = {814--817},
  year    = {1983},
}

% Juang and Katagiri (1992): journal article, IEEE Transactions on Signal Processing.
@article{JK1992,
  author  = {B.-H. Juang and S. Katagiri},
  title   = {Discriminative Learning for Minimum Error Classification},
  journal = {IEEE Transactions on Signal Processing},
  volume  = {40},
  number  = {12},
  pages   = {3043--3054},
  year    = {1992},
}

% Woodland and Povey (2002): journal article.
% The DOI is stored bare (no resolver prefix) so that styles can format it.
@article{WoodlandP02,
  author    = {Woodland, Philip C. and Povey, Daniel},
  title     = {Large scale discriminative training of hidden {Markov} models for speech recognition},
  journal   = {Computer Speech \& Language},
  volume    = {16},
  number    = {1},
  pages     = {25--47},
  year      = {2002},
  doi       = {10.1006/csla.2001.0182},
  bibdate   = {2007-03-05},
  bibsource = {DBLP, http://dblp.uni-trier.de/db/journals/csl/csl16.html#WoodlandP02},
}

% Povey (2003): PhD thesis. Uses the thesis entry type with the degree-granting
% institution in the school field rather than a book with a made-up publisher.
@phdthesis{Dan2003,
  author = {Povey, Daniel},
  title  = {Discriminative training for large vocabulary speech recognition},
  school = {Cambridge University},
  year   = {2003},
}

% Le Roux and McDermott (2005): conference paper, Eurospeech.
% "Le Roux" is written in "Last, First" form so the two-word surname is not split.
% NOTE(review): the word "for" in the title was restored from the published
% title -- confirm against the proceedings.
@inproceedings{RM2005,
  author    = {Le Roux, J. and McDermott, E.},
  title     = {Optimization methods for discriminative training},
  booktitle = {Proc. Eurospeech},
  pages     = {3341--3344},
  address   = {Lisbon, Portugal},
  year      = {2005},
}

% Vapnik (1998): book. Publisher name and city are separate fields; the year is
% given once, in the year field.
@book{Vapnik1998,
  author    = {Vapnik, V.},
  title     = {Statistical learning theory},
  publisher = {Wiley},
  address   = {New York},
  year      = {1998},
}

% Sha (2007): PhD thesis, entered with the thesis type and a school field.
@phdthesis{Fei2007,
  author = {Sha, F.},
  title  = {Large margin training of acoustic models for speech recognition},
  school = {University of Pennsylvania},
  year   = {2007},
}

% Bourlard and Morgan (1993): book. Bibliographic fields come first, followed by
% the CiteULike export metadata, which standard styles ignore.
@book{BourlardM1993,
  author               = {Bourlard, Herve A. and Morgan, Nelson},
  title                = {Connectionist Speech Recognition: A Hybrid Approach},
  publisher            = {Kluwer Academic Publishers},
  address              = {Norwell, MA, USA},
  year                 = {1993},
  isbn                 = {0792393961},
  url                  = {http://portal.acm.org/citation.cfm?id=562393},
  keywords             = {bayesian, hidden-markov-model, neural-network, temporal-processing},
  citeulike-article-id = {3079067},
  citeulike-linkout-0  = {http://portal.acm.org/citation.cfm?id=562393},
  posted-at            = {2008-08-03 23:43:49},
  priority             = {2},
}

% Mohri, Pereira and Riley (2002): journal article.
% Author names are joined with " and "; a comma-separated list is not parsed
% as separate people by BibTeX.
% NOTE(review): page range added from the published article -- confirm.
@article{WFST02,
  author  = {Mohri, Mehryar and Pereira, Fernando C. N. and Riley, Michael},
  title   = {Weighted Finite-State Transducers in Speech Recognition},
  journal = {Computer Speech \& Language},
  volume  = {16},
  number  = {1},
  pages   = {69--88},
  year    = {2002},
}

% Mohri, Pereira and Riley (2008): chapter in an edited handbook.
% Editors, book title, publisher and city each have their own field instead of
% being packed into a journal name.
@incollection{WFST08,
  author    = {Mohri, Mehryar and Pereira, Fernando C. N. and Riley, Michael},
  title     = {Speech recognition with weighted finite-state transducers},
  editor    = {Rabiner, Larry and Juang, Fred},
  booktitle = {Handbook on Speech Processing and Speech Communication, Part {E}: Speech recognition},
  publisher = {Springer-Verlag},
  address   = {Heidelberg, Germany},
  year      = {2008},
}

% Baker (1975): journal article describing the Dragon system.
% NOTE(review): volume 23 is the IEEE Transactions volume for 1975, so the
% journal name was changed from "Proc. ICASSP '75"; the issue number and page
% range were added from the published article -- confirm.
@article{Baker1975,
  author  = {Baker, J.},
  title   = {The {Dragon} system---an overview},
  journal = {IEEE Transactions on Acoustics, Speech, and Signal Processing},
  volume  = {23},
  number  = {1},
  pages   = {24--29},
  year    = {1975},
}

% Baum and Eagon (1967): journal article.
% The title carries no final period (styles add their own punctuation) and
% "Markov" is brace-protected against sentence-casing.
% NOTE(review): issue number added from the published article -- confirm.
@article{BaumEagon1967,
  author  = {Baum, L.~E. and Eagon, J.~A.},
  title   = {An inequality with applications to statistical estimation for probabilistic functions of {Markov} processes and to a model for ecology},
  journal = {Bulletin of the American Mathematical Society},
  volume  = {73},
  number  = {3},
  pages   = {360--363},
  year    = {1967},
}

% Jelinek (1976): journal article, Proceedings of the IEEE.
@article{Jelinek1976,
  author  = {F. Jelinek},
  title   = {Continuous speech recognition by statistical methods},
  journal = {Proceedings of the {IEEE}},
  volume  = {64},
  number  = {4},
  pages   = {532--556},
  year    = {1976},
}

% Juang, Levinson and Sondhi (1986): journal correspondence item.
% "Markov" is capitalised and brace-protected.
% NOTE(review): the end of the page range was added from the published
% article -- confirm.
@article{JuangLS1986,
  author    = {Juang, Bing-Hwang and Levinson, Stephen E. and Sondhi, M. Mohan},
  title     = {Maximum likelihood estimation for multivariate mixture observations of {Markov} chains},
  journal   = {IEEE Transactions on Information Theory},
  volume    = {32},
  number    = {2},
  pages     = {307--309},
  year      = {1986},
  bibdate   = {2005-02-28},
  bibsource = {DBLP, http://dblp.uni-trier.de/db/journals/tit/tit32.html#JuangLS86},
}

% Baum, Petrie, Soules and Weiss (1970): journal article.
% Authors are separated with " and "; the page range uses a double hyphen.
@article{Baum1970,
  author  = {Baum, L. E. and Petrie, T. and Soules, G. and Weiss, N.},
  title   = {A maximization technique occurring in the statistical analysis of probabilistic functions of {Markov} chains},
  journal = {The Annals of Mathematical Statistics},
  volume  = {41},
  number  = {1},
  pages   = {164--171},
  year    = {1970},
}
% Fahlman (1988): technical report, Carnegie Mellon University.
% NOTE(review): the report number was added from the published report -- confirm.
@techreport{Fahlman1988,
  author      = {Fahlman, S. E.},
  title       = {An empirical study of learning speed in back-propagation networks},
  institution = {Carnegie Mellon University},
  number      = {CMU-CS-88-162},
  year        = {1988},
}
% Bourlard and Wellekens (1990): journal article.
% The DOI is stored bare, without the resolver host.
% NOTE(review): issue number added from the published article -- confirm.
@article{Bourlard1990,
  author    = {Bourlard, H. and Wellekens, C. J.},
  title     = {Links Between {Markov} Models and Multilayer Perceptrons},
  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume    = {12},
  number    = {12},
  pages     = {1167--1178},
  year      = {1990},
  issn      = {0162-8828},
  doi       = {10.1109/34.62605},
  publisher = {IEEE Computer Society},
  address   = {Los Alamitos, CA, USA},
}
% Gish (1990): conference paper, ICASSP.
% The proceedings name sits in the booktitle field, which this entry type requires.
@inproceedings{Gish1990,
  author    = {Gish, H.},
  title     = {A probabilistic approach to the understanding and training of neural network classifiers},
  booktitle = {Proc. Int. Conf. on Acoustics, Speech, and Signal Processing},
  pages     = {1361--1364},
  address   = {Albuquerque, NM},
  year      = {1990},
}
% Gopalakrishnan, Kanevsky, Nadas and Nahamoo (1991): journal article.
% The page range uses a double hyphen so it is typeset as an en-dash.
@article{GopalakrishnanKNN91,
  author    = {Gopalakrishnan, P. S. and Kanevsky, Dimitri and N{\'a}das, Arthur and Nahamoo, David},
  title     = {An inequality for rational functions with applications to some statistical estimation problems},
  journal   = {IEEE Transactions on Information Theory},
  volume    = {37},
  number    = {1},
  pages     = {107--113},
  year      = {1991},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}
% Second copy of the WoodlandP02 record (same key and same paper as the entry
% defined earlier in this file). A repeated key makes BibTeX report
% "repeated entry" and discard the later definition, so this copy is kept only
% as an inert comment block; citations keep resolving to the first definition.
@comment{article{WoodlandP02,
  author    = {Philip C. Woodland and
               Daniel Povey},
  title     = {Large scale discriminative training of hidden Markov models
               for speech recognition},
  journal   = {Computer Speech {\&} Language},
  volume    = {16},
  number    = {1},
  year      = {2002},
  pages     = {25-47},
  ee        = {http://dx.doi.org/10.1006/csla.2001.0182},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}}
% McDermott, Hazen, Le Roux, Nakamura and Katagiri (2007): journal article.
% The DOI is moved from the non-standard "ee" field into doi, stored bare.
@article{McDermottHRNK07,
  author    = {McDermott, Erik and Hazen, Timothy J. and Le Roux, Jonathan and Nakamura, Atsushi and Katagiri, Shigeru},
  title     = {Discriminative Training for Large-Vocabulary Speech Recognition Using Minimum Classification Error},
  journal   = {IEEE Transactions on Audio, Speech {\&} Language Processing},
  volume    = {15},
  number    = {1},
  pages     = {203--223},
  year      = {2007},
  doi       = {10.1109/TASL.2006.876778},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}
% Watrous and Shastri (1987): conference paper.
% The month uses the predefined jun macro, so it is left unquoted.
@inproceedings{watrous-shastri-87,
  author    = {R.~L. Watrous and L. Shastri},
  title     = {Learning Phonetic Features Using Connectionist Networks: An Experiment in Speech Recognition},
  booktitle = {IEEE International Conference on Neural Networks},
  year      = {1987},
  month     = jun,
  key       = {Watrous},
}
% Peeling and Moore (1988): journal article, Speech Communication.
% The DOI is stored bare; the publisher address names the country once.
@article{PeelingM88,
  author    = {Peeling, S. M. and Moore, R. K.},
  title     = {Isolated digit recognition experiments using the multi-layer perceptron},
  journal   = {Speech Communication},
  volume    = {7},
  number    = {4},
  pages     = {403--409},
  year      = {1988},
  issn      = {0167-6393},
  doi       = {10.1016/0167-6393(88)90057-X},
  publisher = {Elsevier Science Publishers B. V.},
  address   = {Amsterdam, The Netherlands},
}
% Waibel, Hanazawa, Hinton, Shikano and Lang (1988): conference paper, ICASSP '88.
% The month uses the predefined apr macro so styles can localise it.
@inproceedings{WaibelHHSL88,
  author    = {Waibel, A. and Hanazawa, T. and Hinton, G. and Shikano, K. and Lang, K.},
  title     = {Phoneme recognition: neural networks vs. hidden {Markov} models},
  booktitle = {Proc. ICASSP '88},
  volume    = {1},
  pages     = {107--110},
  month     = apr,
  year      = {1988},
}
% Parker (1982): invention report filed with Stanford University.
% The report identifier uses a plain hyphen; a double hyphen would be typeset
% as an en-dash, which suits ranges but not identifiers.
@techreport{Parker1982,
  author      = {Parker, D. B.},
  title       = {Learning Logic, Invention Report},
  institution = {Office of Technology Licensing, Stanford University},
  number      = {S81-64, File 1},
  month       = oct,
  year        = {1982},
}
% Parker (1985): MIT technical report.
% The report number has its own field instead of being embedded in the
% institution name.
% NOTE(review): the address "Cambridge, MA" expands the original "MIT, MA" -- confirm.
@techreport{Parker1985,
  author      = {Parker, D.},
  title       = {Learning-Logic},
  institution = {Center for Computational Research in Economics and Management Science, MIT},
  number      = {TR-47},
  address     = {Cambridge, MA},
  year        = {1985},
}
% Rosenblatt (1961): book published by Spartan Books.
@book{Rosenblatt1961,
  author    = {F. Rosenblatt},
  title     = {Principles of Neurodynamics: Perceptrons and the Theory of Brain Mechanisms},
  publisher = {Spartan Books},
  address   = {Washington DC},
  year      = {1961},
}
% Rumelhart, Hinton and Williams (1986): chapter in the PDP volume 1.
% The research group is a corporate editor, so it is wrapped in braces to be
% treated as one indivisible name.
% NOTE(review): page range and publisher city added from the published book -- confirm.
@incollection{RumelhartHW86,
  author    = {Rumelhart, David E. and Hinton, Geoffrey E. and Williams, R. J.},
  title     = {Learning Internal Representations by Error Propagation},
  editor    = {Rumelhart, D. E. and McClelland, J. L. and {the PDP Research Group}},
  booktitle = {Parallel distributed processing: Explorations in the microstructure of cognition, Volume 1: Foundations},
  publisher = {MIT Press},
  address   = {Cambridge, MA},
  pages     = {318--362},
  year      = {1986},
  keywords  = {backpropagation, learning algorithms, internal representations},
}
% Chou, Juang and Lee (1992): conference paper, ICASSP 1992.
% Authors are separated with " and "; acronyms in the title are brace-protected.
% NOTE(review): the previous volume (40) and month (Dec) matched the Juang and
% Katagiri journal article rather than this paper; they are set here to the
% ICASSP-92 values (volume 1, March) -- confirm against the proceedings.
@inproceedings{Juang1992,
  author    = {Chou, W. and Juang, B.-H. and Lee, C.-H.},
  title     = {Segmental {GPD} training of {HMM} based speech recognizer},
  booktitle = {Proc. ICASSP 1992},
  volume    = {1},
  pages     = {473--476},
  month     = mar,
  year      = {1992},
}
% Sha and Saul (2006): conference paper, ICASSP 2006.
% "Gaussian" is brace-protected so sentence-casing styles keep the capital.
@inproceedings{Sha2006,
  author    = {Sha, F. and Saul, L. K.},
  title     = {Large Margin {Gaussian} mixture modelling for phonetic classification and recognition},
  booktitle = {Proc. ICASSP 2006},
  pages     = {265--268},
  year      = {2006},
}
% Cybenko (1989): journal article on approximation by sigmoidal superpositions.
% The journal name is given without the trailing acronym.
% NOTE(review): publisher changed from Elsevier to Springer-Verlag, the
% publisher of this journal -- confirm.
@article{Cybenko89,
  author    = {Cybenko, G.},
  title     = {Approximation by superpositions of a sigmoidal function},
  journal   = {Mathematics of Control, Signals, and Systems},
  volume    = {2},
  number    = {4},
  pages     = {303--314},
  year      = {1989},
  publisher = {Springer-Verlag},
}
% Poggio and Girosi: journal article, Proceedings of the IEEE.
% The citation key is left unchanged so existing citations still resolve.
% NOTE(review): volume 78, pp. 1481--1497 corresponds to the September 1990
% issue, so the year was changed from 1989 and the issue number added -- confirm.
@article{Poggio89,
  author  = {Poggio, T. and Girosi, F.},
  title   = {Networks for approximation and learning},
  journal = {Proceedings of the {IEEE}},
  volume  = {78},
  number  = {9},
  pages   = {1481--1497},
  year    = {1990},
}
% Juang, Chou and Lee (1997): journal article, IEEE Transactions on Speech and
% Audio Processing, so it uses the article type with a journal field.
% Every field is followed by a comma; a missing separator stops the parser.
% NOTE(review): month (May) and page range added from the published article;
% the previous month value was "Dec" -- confirm.
@article{Juang1997,
  author  = {Juang, B.-H. and Chou, W. and Lee, C.-H.},
  title   = {Minimum classification error rate methods for speech recognition},
  journal = {IEEE Transactions on Speech and Audio Processing},
  volume  = {5},
  number  = {3},
  pages   = {257--265},
  month   = may,
  year    = {1997},
}
% Povey and Woodland (2002): conference paper, ICASSP 2002.
% The two authors are separated with " and "; with commas only, BibTeX reads
% the whole string as a single malformed name.
% NOTE(review): volume and page range added from the proceedings -- confirm.
@inproceedings{Povey2002,
  author    = {Povey, D. and Woodland, P. C.},
  title     = {Minimum phone error and {I-smoothing} for improved discriminative training},
  booktitle = {Proc. ICASSP 2002},
  volume    = {1},
  pages     = {105--108},
  year      = {2002},
}
% Aho, Hopcroft and Ullman (1974): book.
% Each author is in "Last, First" form joined by " and "; publisher and city
% are separate fields.
@book{aho1974,
  author    = {Aho, A. V. and Hopcroft, J. E. and Ullman, J. D.},
  title     = {The Design and Analysis of Computer Algorithms},
  publisher = {Addison-Wesley},
  address   = {Reading, MA},
  year      = {1974},
}
% Hopcroft and Ullman (1979): book.
% The author list previously carried Aho's initials in front of Hopcroft's
% name; this book has two authors.
@book{Hopcroft1979,
  author    = {Hopcroft, J. E. and Ullman, J. D.},
  title     = {Introduction to Automata Theory, Languages, and Computation},
  publisher = {Addison-Wesley},
  address   = {Reading, MA},
  year      = {1979},
}
% Riedmiller and Braun (1993): conference paper introducing RPROP.
% No publisher field is given: an empty value only triggers an "empty field"
% warning. The acronym in the title is brace-protected.
@inproceedings{Riedmiller93adirect,
  author    = {Riedmiller, Martin and Braun, Heinrich},
  title     = {A Direct Adaptive Method for Faster Backpropagation Learning: The {RPROP} Algorithm},
  booktitle = {{IEEE} International Conference on Neural Networks},
  pages     = {586--591},
  year      = {1993},
}
% Young et al. (2009): The HTK Book.
% Authors are separated with " and ". Two names are corrected to the spellings
% used elsewhere in this file (Odell, Povey).
@book{HTK,
  author    = {Young, Steve and Evermann, Gunnar and Gales, Mark and Hain, Thomas and Kershaw, Dan and Liu, Xunying and Moore, Gareth and Odell, Julian and Ollason, Dave and Povey, Dan and Valtchev, Valtcho and Woodland, Phil},
  title     = {The {HTK} Book},
  publisher = {Cambridge University Engineering Department},
  year      = {2009},
}

% Atal and Hanauer (1971): journal article on linear prediction of speech.
% Names are in "Last, Initials" form joined by " and ".
% NOTE(review): full journal name and issue number supplied from the published
% article -- confirm.
@article{Atal71,
  author  = {Atal, B. S. and Hanauer, S. L.},
  title   = {Speech Analysis and Synthesis by Linear Prediction of the Speech Wave},
  journal = {The Journal of the Acoustical Society of America},
  volume  = {50},
  number  = {2B},
  pages   = {637--655},
  year    = {1971},
}
% Davis and Mermelstein (1980): journal article comparing parametric speech
% representations. The journal name is given in its natural word order,
% without the bracketed export note.
@article{DavisMFCC,
  author   = {Davis, S. and Mermelstein, P.},
  title    = {Comparison of parametric representations for monosyllabic word recognition in continuously spoken sentences},
  journal  = {IEEE Transactions on Acoustics, Speech, and Signal Processing},
  volume   = {28},
  number   = {4},
  pages    = {357--366},
  year     = {1980},
  keywords = {mfcc, speech},
}
% Hermansky (1990): journal article introducing PLP analysis.
% The acronym in the title is brace-protected against sentence-casing.
% NOTE(review): full journal name and issue number supplied from the published
% article -- confirm.
@article{HermanskyPLP,
  author  = {Hermansky, Hynek},
  title   = {Perceptual linear predictive ({PLP}) analysis of speech},
  journal = {The Journal of the Acoustical Society of America},
  volume  = {87},
  number  = {4},
  pages   = {1738--1752},
  year    = {1990},
}
% Rabiner (1989): tutorial article in the Proceedings of the IEEE, which is a
% journal, so the entry uses the article type with a journal field.
% NOTE(review): volume and issue number added from the published article -- confirm.
@article{Rabiner89atutorial,
  author  = {Rabiner, Lawrence R.},
  title   = {A tutorial on hidden {Markov} models and selected applications in speech recognition},
  journal = {Proceedings of the {IEEE}},
  volume  = {77},
  number  = {2},
  pages   = {257--286},
  year    = {1989},
}
% Valtchev, Odell, Woodland and Young (1997): journal article, Speech Communication.
% The DOI is stored bare, the page range uses a double hyphen without spaces,
% and no empty note field is carried.
@article{Valtchev1997303,
  author  = {Valtchev, V. and Odell, J. J. and Woodland, P. C. and Young, S. J.},
  title   = {{MMIE} training of large vocabulary recognition systems},
  journal = {Speech Communication},
  volume  = {22},
  number  = {4},
  pages   = {303--314},
  year    = {1997},
  issn    = {0167-6393},
  doi     = {10.1016/S0167-6393(97)00029-0},
  url     = {http://www.sciencedirect.com/science/article/B6V1C-3WN74BD-1/2/af84170bff5009b7e1cd3f3a6b0db694},
}
